Dimensions: 2749 85

[1] “patient”

Variable patient

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

Nº Categories = 2749

Table continues below
TCGA-02-0047 TCGA-02-0055 TCGA-02-2486 TCGA-04-1348 TCGA-04-1357
0.03638 0.03638 0.03638 0.03638 0.03638
TCGA-04-1362 TCGA-04-1364 TCGA-04-1514 TCGA-05-4249 TCGA-05-4250
0.03638 0.03638 0.03638 0.03638 0.03638

[1] “sample”

Variable sample

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

Nº Categories = 2749

Table continues below
TCGA-02-0047-01A TCGA-02-0055-01A TCGA-02-2486-01A TCGA-04-1348-01A
0.03638 0.03638 0.03638 0.03638
Table continues below
TCGA-04-1357-01A TCGA-04-1362-01A TCGA-04-1364-01A TCGA-04-1514-01A
0.03638 0.03638 0.03638 0.03638
TCGA-05-4249-01A TCGA-05-4250-01A
0.03638 0.03638

[1] “shortlettercode”

Variable shortlettercode

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[min,max]=[ TP , TP ]

Values: TP

Nº Categories = 1

TP
100

[1] “definition”

Variable definition

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[min,max]=[ Primary solid Tumor , Primary solid Tumor ]

Values: Primary solid Tumor

Nº Categories = 1

Primary solid Tumor
100

[1] “sample_submitter_id”

Variable sample_submitter_id

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

Nº Categories = 2749

Table continues below
TCGA-02-0047-01A TCGA-02-0055-01A TCGA-02-2486-01A TCGA-04-1348-01A
0.03638 0.03638 0.03638 0.03638
Table continues below
TCGA-04-1357-01A TCGA-04-1362-01A TCGA-04-1364-01A TCGA-04-1514-01A
0.03638 0.03638 0.03638 0.03638
TCGA-05-4249-01A TCGA-05-4250-01A
0.03638 0.03638

[1] “sample_type_id”

Variable sample_type_id

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[min,max]=[ 01 , 01 ]

Values: 01

Nº Categories = 1

01
100

[1] “tumor_descriptor”

Variable tumor_descriptor

Nas ratio = 74.21 %

Nas ratio_2 = 0 %

Nas dif_ratio = -74.21 %

Main value % = 100 %

[min,max]=[ Not Reported , Not Reported ]

Values: Not Reported

Nº Categories = 1

Not Reported
100

[1] “sample_id”

Variable sample_id

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

Nº Categories = 2749

Table continues below
0050544d-d812-4a18-8370-96d629b487ab 005f1dd8-49e2-4448-b37e-ac9fcffb02d6
0.03638 0.03638
Table continues below
0072bb9f-bed6-44df-800c-9637019b4707 0096c7fb-34e3-4d0f-ba81-3559cc00080a
0.03638 0.03638
Table continues below
009e66cd-fcdf-4a91-a2d8-7b9485ca29e1 00be5ec1-3b0f-4b5a-b116-4efce25d2cc8
0.03638 0.03638
Table continues below
00e66db2-da46-4003-9853-72b482d29999 01069064-dc19-4e9b-b96d-c8473ef954ee
0.03638 0.03638
01079b02-ab3b-4f17-b54c-0f774ac572b2 0109063d-7bc6-4973-8c67-98e48a2a2e4e
0.03638 0.03638

[1] “sample_type”

Variable sample_type

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[min,max]=[ Primary Tumor , Primary Tumor ]

Values: Primary Tumor

Nº Categories = 1

Primary Tumor
100

[1] “composition”

Variable composition

Nas ratio = 74.21 %

Nas ratio_2 = 0 %

Nas dif_ratio = -74.21 %

Main value % = 100 %

[min,max]=[ Not Reported , Not Reported ]

Values: Not Reported

Nº Categories = 1

Not Reported
100

[1] “days_to_collection”

Variable days_to_collection

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 75.52 %

[min,max]=[ -138 , 7290 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
-138 0 0 161.9443 0 7290

[1] “state”

Variable state

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[min,max]=[ released , released ]

Values: released

Nº Categories = 1

released
100

[1] “initial_weight”

Variable initial_weight

Nas ratio = 71.92 %

Nas ratio_2 = 0 %

Nas dif_ratio = -71.92 %

Main value % = 4.53 %

[min,max]=[ 1 , 2420 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
1 120 230 325.4858 412.5 2420

[1] “pathology_report_uuid”

Variable pathology_report_uuid

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

Nº Categories = 2749

Table continues below
00037eac-1ab2-45ff-869a-e6a7c6580a1f 001c43cb-3e9b-43db-b6d0-61e67d058c9f
0.03638 0.03638
Table continues below
001e0e3e-04bd-407a-b65f-d2636ee28886 0033fca4-2372-402f-8281-d204b0e7cb5f
0.03638 0.03638
Table continues below
0046795b-3d8b-4921-8d11-19e7c9ad6bc3 005A9931-5051-4739-AA85-86238410CEC4
0.03638 0.03638
Table continues below
00bdbfd9-ca96-4c34-b4c1-eae63818fa93 00FB68C5-7946-4E69-9019-4E8BF9EB6A94
0.03638 0.03638
00fd3d04-b48e-434e-8d25-0f0949e796cc 011132B0-CA1B-4F19-B338-050E69F2E2FC
0.03638 0.03638

[1] “submitter_id”

Variable submitter_id

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

Nº Categories = 2749

Table continues below
TCGA-02-0047 TCGA-02-0055 TCGA-02-2486 TCGA-04-1348 TCGA-04-1357
0.03638 0.03638 0.03638 0.03638 0.03638
TCGA-04-1362 TCGA-04-1364 TCGA-04-1514 TCGA-05-4249 TCGA-05-4250
0.03638 0.03638 0.03638 0.03638 0.03638

[1] “oct_embedded”

Variable oct_embedded

Nas ratio = 71.99 %

Nas ratio_2 = 0 %

Nas dif_ratio = -71.99 %

Main value % = 66.62 %

[min,max]=[ false , true ]

Values: true false

Nº Categories = 2

true false
66.62 33.38

[1] “is_ffpe”

Variable is_ffpe

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[1] “tissue_type”

Variable tissue_type

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[min,max]=[ Not Reported , Not Reported ]

Values: Not Reported

Nº Categories = 1

Not Reported
100

[1] “synchronous_malignancy”

Variable synchronous_malignancy

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 79.83 %

[min,max]=[ No , Yes ]

Values: Yes Not Reported No

Nº Categories = 3

No Not Reported Yes
79.83 19.84 0.33

[1] “ajcc_pathologic_stage”

Variable ajcc_pathologic_stage

Nas ratio = 28.7 %

Nas ratio_2 = 0 %

Nas dif_ratio = -28.7 %

Main value % = 16.28 %

[min,max]=[ Stage I , Stage IVC ]

Values: Stage IVC Stage IVB Stage IVA Stage IV Stage IIIC Stage IIIB Stage IIIA Stage III Stage IIC Stage IIB Stage IIA Stage II Stage IB Stage IA Stage I

Nº Categories = 15

Table continues below
Stage I Stage III Stage IIB Stage IV Stage II Stage IB
16.28 11.99 10.36 10.05 9.388 8.061
Stage IIIA Stage IVA Stage IIA Stage IA
7.908 7.806 6.684 5.357

[1] “days_to_diagnosis”

Variable days_to_diagnosis

Nas ratio = 3.97 %

Nas ratio_2 = 0 %

Nas dif_ratio = -3.97 %

Main value % = 100 %

[min,max]=[ 0 , 0 ]

Values: 0

Nº Categories = 1

0
100

[1] “treatments”

Variable treatments

Nas ratio = 59.38 %

Nas ratio_2 = 0 %

Nas dif_ratio = -59.38 %

Main value % = 15.38 %

Nº Categories = 16369

Table continues below
NOS released no Pharmaceutical Therapy Radiation Therapy
13.33 13.33 6.784 6.667 6.667
Table continues below
yes not reported 2019-07-31T15:12:53.693498-05:00
4.86 1.689 0.004889
2019-07-31T15:13:10.219711-05:00 2019-07-31T15:13:38.311641-05:00
0.004889 0.004889

[1] “last_known_disease_status”

Variable last_known_disease_status

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 100 %

[min,max]=[ not reported , not reported ]

Values: not reported

Nº Categories = 1

not reported
100

[1] “tissue_or_organ_of_origin”

Variable tissue_or_organ_of_origin

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 19.22 %

Nº Categories = 91

Table continues below
NOS Kidney lung Upper lobe Ovary Breast
28.07 11.62 9.734 5.942 4.634 3.725
Lower lobe Brain Prostate gland Cerebrum
3.503 3.37 2.461 2.306

[1] “days_to_last_follow_up”

Variable days_to_last_follow_up

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 28.05 %

[min,max]=[ -4170 , 7248 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
-4170 546 1095 1180.752 1470 7248

[1] “age_at_diagnosis”

Variable age_at_diagnosis

Nas ratio = 3.24 %

Nas ratio_2 = 0 %

Nas dif_ratio = -3.24 %

Main value % = 0.19 %

[min,max]=[ 5267 , 32872 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
5267 19382.75 22671.5 22375.26 25853.25 32872

[1] “primary_diagnosis”

Variable primary_diagnosis

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 19.25 %

Nº Categories = 92

Table continues below
NOS Squamous cell carcinoma Adenocarcinoma
40.95 10.85 9.116
Table continues below
Clear cell adenocarcinoma Serous cystadenocarcinoma
7.769 4.294
Table continues below
Infiltrating duct carcinoma Papillary adenocarcinoma Glioblastoma
3.377 2.499 2.323
Transitional cell carcinoma anaplastic
1.581 1.191

[1] “prior_malignancy”

Variable prior_malignancy

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 79.28 %

[min,max]=[ no , yes ]

Values: yes not reported no

Nº Categories = 3

no not reported yes
79.28 11.92 8.801

[1] “year_of_diagnosis”

Variable year_of_diagnosis

Nas ratio = 3.75 %

Nas ratio_2 = 0 %

Nas dif_ratio = -3.75 %

Main value % = 11.15 %

[min,max]=[ 1987 , 2013 ]

Values: 2013 2012 2011 2010 2009 2008 2007 2006 2005 2004 2003 2002 2001 2000 1999 1998 1997 1996 1995 1994 1993 1992 1991 1990 1987

Nº Categories = 25

Table continues below
2011 2010 2006 2007 2009 2008
11.15 9.486 8.617 8.239 8.088 7.861
2012 2005 2004 2003
7.37 7.143 6.576 4.762

[1] “prior_treatment”

Variable prior_treatment

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 98.46 %

[min,max]=[ No , Yes ]

Values: Yes No

Nº Categories = 2

No Yes
98.46 1.54

[1] “ajcc_pathologic_t”

Variable ajcc_pathologic_t

Nas ratio = 21.86 %

Nas ratio_2 = 0 %

Nas dif_ratio = -21.86 %

Main value % = 25.56 %

[min,max]=[ T0 , TX ]

Values: TX T4d T4b T4a T4 T3c T3b T3a T3 T2c T2b T2a2 T2a T2 T1c T1b2 T1b1 T1b T1a T1 T0

Nº Categories = 21

Table continues below
T2 T3 T3a T1 T1b T1a
25.56 18.95 9.451 6.983 6.378 6.052
T4a T3b T4 T2a
6.006 4.33 3.678 3.119

[1] “morphology”

Variable morphology

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 19.25 %

Nº Categories = 79

Table continues below
8070/3 8140/3 8310/3 8441/3 8500/3 8260/3
19.25 16.28 14.59 8.067 6.344 4.694
9440/3 8120/3 8317/3 8255/3
4.364 2.97 1.98 1.613

[1] “ajcc_clinical_m”

Variable ajcc_clinical_m

Nas ratio = 81.74 %

Nas ratio_2 = 0 %

Nas dif_ratio = -81.74 %

Main value % = 93.63 %

[min,max]=[ M0 , MX ]

Values: MX M1b M1 M0

Nº Categories = 4

M0 MX M1 M1b
93.63 3.984 2.191 0.1992

[1] “ajcc_pathologic_n”

Variable ajcc_pathologic_n

Nas ratio = 22.26 %

Nas ratio_2 = 0 %

Nas dif_ratio = -22.26 %

Main value % = 45.77 %

[min,max]=[ N0 , NX ]

Values: NX N3b N3a N3 N2c N2b N2a N2 N1mi N1c N1b N1a N1 N0 (i+) N0 (i-) N0

Nº Categories = 16

Table continues below
N0 NX N1 N2 N2b N1a
45.77 17.36 17.31 7.487 2.948 2.293
N3 N2c N3a N0 (i-)
1.778 1.638 0.9827 0.6083

[1] “classification_of_tumor”

Variable classification_of_tumor

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 100 %

[min,max]=[ not reported , not reported ]

Values: not reported

Nº Categories = 1

not reported
100

[1] “diagnosis_id”

Variable diagnosis_id

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 0.04 %

Nº Categories = 2727

Table continues below
00137f74-b3b0-54a4-bca0-9a1477f4a082 002c9efa-a79e-5691-9bb6-34eff2ea2c33
0.03667 0.03667
Table continues below
00595bd0-e968-554d-bfaa-dafdd251817c 008cf944-786b-581a-a969-d6b2fab187b3
0.03667 0.03667
Table continues below
00d350c8-1251-5563-956c-06ed409eefe0 00d455d1-fd97-5e93-9225-d982f0ad3780
0.03667 0.03667
Table continues below
00d4a2c7-fab2-52a0-91fe-ca6922d66a73 00e5e55f-e88e-5622-91c0-62c6a9426c9a
0.03667 0.03667
00f8ee1c-618f-530e-8d64-954aff8478aa 012f225f-1cb8-5962-a806-b05cca31ffd9
0.03667 0.03667

[1] “icd_10_code”

Variable icd_10_code

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 16.54 %

Nº Categories = 91

Table continues below
C64.9 C34.1 C56.9 C50.9 C34.3 C71.9
16.54 10.12 7.517 6.161 5.647 5.574
C61 C71.0 C64.1 C73
4.07 3.814 2.677 2.604

[1] “site_of_resection_or_biopsy”

Variable site_of_resection_or_biopsy

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 19.22 %

Nº Categories = 97

Table continues below
NOS Kidney lung Upper lobe Ovary Breast
27.84 11.64 9.756 5.956 4.511 3.733
Lower lobe Brain Prostate gland Cerebrum
3.511 3.378 2.467 2.311

[1] “tumor_grade”

Variable tumor_grade

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 100 %

[min,max]=[ not reported , not reported ]

Values: not reported

Nº Categories = 1

not reported
100

[1] “progression_or_recurrence”

Variable progression_or_recurrence

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 100 %

[min,max]=[ not reported , not reported ]

Values: not reported

Nº Categories = 1

not reported
100

[1] “alcohol_history”

Variable alcohol_history

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 87.42 %

[min,max]=[ No , Yes ]

Values: Yes Not Reported No

Nº Categories = 3

Not Reported Yes No
87.42 8.141 4.437

[1] “exposure_id”

Variable exposure_id

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 0.04 %

Nº Categories = 2727

Table continues below
00001051-e0ee-5249-9d57-1607d3cef8a0 00118399-52df-543b-b341-755bc688aa93
0.03667 0.03667
Table continues below
00633947-107a-5aa2-88cc-0f69f1e84921 006657eb-c3ec-50dc-a517-45e00d4ab917
0.03667 0.03667
Table continues below
00800dc3-f8a8-5787-9ed1-48e99fc6606b 009aadd9-13c8-593c-a526-e04025afe4f6
0.03667 0.03667
Table continues below
00dafcc3-64fa-560c-9fbd-18c3bba156a5 00f7640a-590a-5428-80c9-d8892f5f2ae0
0.03667 0.03667
0107d3dd-8088-5c38-8bb2-c5f29cf177d4 0108b070-da38-5ad2-94a6-d15ef5ee71ff
0.03667 0.03667

[1] “race”

Variable race

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 81.26 %

[min,max]=[ american indian or alaska native , white ]

Values: white not reported native hawaiian or other pacific islander black or african american asian american indian or alaska native

Nº Categories = 6

Table continues below
white not reported black or african american asian
81.26 7.811 7.151 3.63
american indian or alaska native native hawaiian or other pacific islander
0.11 0.03667

[1] “gender”

Variable gender

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 53.65 %

[min,max]=[ female , male ]

Values: male female

Nº Categories = 2

male female
53.65 46.35

[1] “ethnicity”

Variable ethnicity

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 74.26 %

[min,max]=[ hispanic or latino , not reported ]

Values: not reported not hispanic or latino hispanic or latino

Nº Categories = 3

not hispanic or latino not reported hispanic or latino
74.26 23.21 2.53

[1] “vital_status”

Variable vital_status

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 60.18 %

[min,max]=[ Alive , Dead ]

Values: Dead Alive

Nº Categories = 2

Dead Alive
60.18 39.82

[1] “age_at_index”

Variable age_at_index

Nas ratio = 2.26 %

Nas ratio_2 = 0 %

Nas dif_ratio = -2.26 %

Main value % = 3.87 %

[min,max]=[ 14 , 90 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
14 53 62 60.82248 70 90

[1] “days_to_birth”

Variable days_to_birth

Nas ratio = 3.24 %

Nas ratio_2 = 0 %

Nas dif_ratio = -3.24 %

Main value % = 0.19 %

[min,max]=[ -32872 , -5267 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
-32872 -25853.25 -22671.5 -22375.26 -19382.75 -5267

[1] “year_of_birth”

Variable year_of_birth

Nas ratio = 4.77 %

Nas ratio_2 = 0 %

Nas dif_ratio = -4.77 %

Main value % = 3.36 %

[min,max]=[ 1908 , 1995 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
1908 1936 1945 1945.914 1955 1995

[1] “demographic_id”

Variable demographic_id

Nas ratio = 0.8 %

Nas ratio_2 = 0 %

Nas dif_ratio = -0.8 %

Main value % = 0.04 %

Nº Categories = 2727

Table continues below
0006e7b4-8d78-5467-82ed-07654fd97ce4 001548ee-6514-5503-ada1-0105c21db6db
0.03667 0.03667
Table continues below
0077011e-a24a-53b9-a202-01b6e414df3a 008339c9-8305-5fc6-8c44-dde0fcb3b4ad
0.03667 0.03667
Table continues below
009ccb3c-781d-50c9-afa6-4ae885be125f 00b798ab-3977-58ff-ae2a-fceac37cc7f3
0.03667 0.03667
Table continues below
00b9f7ea-ee57-5c0f-81c9-0437761e4b58 00bd3937-6d32-59a5-b25e-91c44fa6cdf3
0.03667 0.03667
00c9288b-48ac-53a9-a482-09c92ab6d0e9 00d4de85-6831-5313-8493-4102bd43a904
0.03667 0.03667

[1] “days_to_death”

Variable days_to_death

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 41.07 %

[min,max]=[ 0 , 6425 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
0 0 113 398.9975 519 6425

[1] “year_of_death”

Variable year_of_death

Nas ratio = 63.62 %

Nas ratio_2 = 0 %

Nas dif_ratio = -63.62 %

Main value % = 10.6 %

[min,max]=[ 1992 , 2014 ]

Values: 2014 2013 2012 2011 2010 2009 2008 2007 2006 2005 2004 2003 2002 2001 2000 1999 1998 1997 1996 1995 1994 1993 1992

Nº Categories = 23

Table continues below
2008 2009 2006 2007 2010 2005 2004
10.6 10.3 8.5 8.4 8.1 7.7 7.4
2013 2003 2002
5.5 5.2 4.7

[1] “bcr_patient_barcode”

Variable bcr_patient_barcode

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

Nº Categories = 2749

Table continues below
TCGA-02-0047-01A TCGA-02-0055-01A TCGA-02-2486-01A TCGA-04-1348-01A
0.03638 0.03638 0.03638 0.03638
Table continues below
TCGA-04-1357-01A TCGA-04-1362-01A TCGA-04-1364-01A TCGA-04-1514-01A
0.03638 0.03638 0.03638 0.03638
TCGA-05-4249-01A TCGA-05-4250-01A
0.03638 0.03638

[1] “primary_site”

Variable primary_site

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 8.12 %

Nº Categories = 61

Table continues below
Kidney Bronchus and lung Bones Other and unspecified parts of tongue
7.247 6.603 4.158 4.016
Table continues below
joints and articular cartilage of other and unspecified sites oral cavity and pharynx Base of tongue
3.643 3.501 3.501
Floor of mouth Gum Hypopharynx
3.501 3.501 3.501

[1] “project_id”

Variable project_id

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 14.41 %

[min,max]=[ TCGA-ACC , TCGA-UVM ]

Values: TCGA-UVM TCGA-UCS TCGA-UCEC TCGA-THYM TCGA-THCA TCGA-TGCT TCGA-STAD TCGA-SKCM TCGA-SARC TCGA-READ TCGA-PRAD TCGA-PCPG TCGA-PAAD TCGA-OV TCGA-MESO TCGA-LUSC TCGA-LUAD TCGA-LIHC TCGA-LGG TCGA-KIRP TCGA-KIRC TCGA-KICH TCGA-HNSC TCGA-GBM TCGA-ESCA TCGA-DLBC TCGA-COAD TCGA-CHOL TCGA-CESC TCGA-BRCA

Nº Categories = 32

Table continues below
TCGA-KIRC TCGA-HNSC TCGA-LUSC TCGA-LUAD TCGA-OV TCGA-BRCA
14.41 9.895 9.603 8.258 7.603 6.148
TCGA-LGG TCGA-STAD TCGA-GBM TCGA-PRAD
5.056 4.402 4.365 4.038

[1] “disease_type”

Variable disease_type

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 24.98 %

[min,max]=[ Mucinous and Serous Neoplasms , Transitional Cell Papillomas and Carcinomas ]

Values: Transitional Cell Papillomas and Carcinomas Thymic Epithelial Neoplasms Synovial-like Neoplasms Squamous Cell Neoplasms Soft Tissue Tumors and Sarcomas Paragangliomas and Glomus Tumors Not Reported Nevi and Melanomas Nerve Sheath Tumors Myomatous Neoplasms Mesothelial Neoplasms Mature B-Cell Lymphomas Lipomatous Neoplasms Gliomas Germ Cell Neoplasms Fibromatous Neoplasms Fibroepithelial Neoplasms Epithelial Neoplasms Ductal and Lobular Neoplasms Cystic Complex Mixed and Stromal Neoplasms Complex Epithelial Neoplasms Basal Cell Neoplasms Adnexal and Skin Appendage Neoplasms Adenomas and Adenocarcinomas Acinar Cell Neoplasms NOS Mucinous and Serous Neoplasms

Nº Categories = 28

Table continues below
Adenomas and Adenocarcinomas Mucinous and Serous Neoplasms Cystic
19.93 13.44 13.44
Table continues below
Squamous Cell Neoplasms NOS Epithelial Neoplasms Not Reported
10.38 6.778 6.283 4.589
Ductal and Lobular Neoplasms Complex Epithelial Neoplasms Gliomas
4.23 3.389 3.203

[1] “name”

Variable name

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 14.41 %

[min,max]=[ Adrenocortical Carcinoma , Uveal Melanoma ]

Values: Uveal Melanoma Uterine Corpus Endometrial Carcinoma Uterine Carcinosarcoma Thyroid Carcinoma Thymoma Testicular Germ Cell Tumors Stomach Adenocarcinoma Skin Cutaneous Melanoma Sarcoma Rectum Adenocarcinoma Prostate Adenocarcinoma Pheochromocytoma and Paraganglioma Pancreatic Adenocarcinoma Ovarian Serous Cystadenocarcinoma Mesothelioma Lymphoid Neoplasm Diffuse Large B-cell Lymphoma Lung Squamous Cell Carcinoma Lung Adenocarcinoma Liver Hepatocellular Carcinoma Kidney Renal Papillary Cell Carcinoma Kidney Renal Clear Cell Carcinoma Kidney Chromophobe Head and Neck Squamous Cell Carcinoma Glioblastoma Multiforme Esophageal Carcinoma Colon Adenocarcinoma Cholangiocarcinoma Cervical Squamous Cell Carcinoma and Endocervical Adenocarcinoma Breast Invasive Carcinoma Brain Lower Grade Glioma

Nº Categories = 32

Table continues below
Kidney Renal Clear Cell Carcinoma Head and Neck Squamous Cell Carcinoma
14.41 9.895
Table continues below
Lung Squamous Cell Carcinoma Lung Adenocarcinoma Ovarian Serous Cystadenocarcinoma
9.603 8.258 7.603
Table continues below
Breast Invasive Carcinoma Brain Lower Grade Glioma Stomach Adenocarcinoma
6.148 5.056 4.402
Glioblastoma Multiforme Prostate Adenocarcinoma
4.365 4.038

[1] “releasable”

Variable releasable

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[1] “released”

Variable released

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 100 %

[1] “ajcc_staging_system_edition”

Variable ajcc_staging_system_edition

Nas ratio = 41.58 %

Nas ratio_2 = 0 %

Nas dif_ratio = -41.58 %

Main value % = 49.63 %

[min,max]=[ 2nd , 7th ]

Values: 7th 6th 5th 4th 3rd 2nd

Nº Categories = 6

7th 6th 5th 4th 3rd 2nd
49.63 44.15 5.106 0.5604 0.4359 0.1245

[1] “ajcc_pathologic_m”

Variable ajcc_pathologic_m

Nas ratio = 33.65 %

Nas ratio_2 = 0 %

Nas dif_ratio = -33.65 %

Main value % = 74.89 %

[min,max]=[ cM0 (i+) , MX ]

Values: MX M1b M1a M1 M0 cM0 (i+)

Nº Categories = 6

M0 MX M1 M1b M1a cM0 (i+)
74.89 16.67 7.95 0.2741 0.1645 0.05482

[1] “ajcc_clinical_t”

Variable ajcc_clinical_t

Nas ratio = 82.39 %

Nas ratio_2 = 0 %

Nas dif_ratio = -82.39 %

Main value % = 23.14 %

[min,max]=[ T1 , TX ]

Values: TX T4d T4b T4a T4 T3b T3a T3 T2c T2b T2a T2 T1c T1b T1a T1

Nº Categories = 16

Table continues below
T2 T4a T3 T1c T3a T2b
23.14 19.83 19.63 9.298 4.959 4.752
T1 T2c T2a T1a
4.545 3.306 2.686 2.479

[1] “cigarettes_per_day”

Variable cigarettes_per_day

Nas ratio = 76.32 %

Nas ratio_2 = 0 %

Nas dif_ratio = -76.32 %

Main value % = 11.67 %

[min,max]=[ 0.008219178 , 10.9589 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
0.0082192 1.369863 2.191781 2.467125 3.287671 10.9589

[1] “pack_years_smoked”

Variable pack_years_smoked

Nas ratio = 76.32 %

Nas ratio_2 = 0 %

Nas dif_ratio = -76.32 %

Main value % = 11.67 %

[min,max]=[ 0.15 , 200 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
0.15 25 40 45.02504 60 200

[1] “days_to_sample_procurement”

Variable days_to_sample_procurement

Nas ratio = 100 %

Nas ratio_2 = 0 %

Nas dif_ratio = -100 %

Main value % = NA %

[1] “preservation_method”

Variable preservation_method

Nas ratio = 100 %

Nas ratio_2 = 0 %

Nas dif_ratio = -100 %

Main value % = NA %

[1] “figo_stage”

Variable figo_stage

Nas ratio = 90.36 %

Nas ratio_2 = 0 %

Nas dif_ratio = -90.36 %

Main value % = 59.25 %

[min,max]=[ Stage I , Stage IVB ]

Values: Stage IVB Stage IVA Stage IV Stage IIIC2 Stage IIIC1 Stage IIIC Stage IIIB Stage IIIA Stage III Stage IIC Stage IIB Stage IIA2 Stage IIA Stage II Stage IB2 Stage IB1 Stage IB Stage IA Stage I

Nº Categories = 19

Table continues below
Stage IIIC Stage IV Stage IIIB Stage IB Stage IIC Stage IIIA
59.25 10.19 4.906 3.396 3.396 3.396
Stage IIB Stage IVB Stage IB1 Stage IA
2.264 2.264 1.887 1.509

[1] “intermediate_dimension”

Variable intermediate_dimension

Nas ratio = 29.54 %

Nas ratio_2 = 0 %

Nas dif_ratio = -29.54 %

Main value % = 16.21 %

[min,max]=[ 0 , 3 ]

Values: 3 2 1 0

Nº Categories = 26

Table continues below
1 0.8 0.6 0.7 0.9 0.5
16.21 14.15 11.98 10.69 10.38 7.331
0.4 1.2 1.3 1.5
6.092 3.769 3.407 3.098

[1] “shortest_dimension”

Variable shortest_dimension

Nas ratio = 29.54 %

Nas ratio_2 = 0 %

Nas dif_ratio = -29.54 %

Main value % = 24.21 %

[min,max]=[ 0 , 1 ]

Values: 1 0

Nº Categories = 13

Table continues below
0.3 0.4 0.2 0.5 0.6 0.1
24.21 21.99 15.28 15.07 7.486 4.027
0.7 0.8 0.9 1
3.924 3.665 2.323 1.033

[1] “longest_dimension”

Variable longest_dimension

Nas ratio = 29.54 %

Nas ratio_2 = 0 %

Nas dif_ratio = -29.54 %

Main value % = 15.38 %

[min,max]=[ 0 , 4 ]

Values: 4 3 2 1 0

Nº Categories = 38

Table continues below
1 1.5 1.2 2 1.3 0.9
15.38 9.241 7.383 6.247 6.04 5.834
1.1 0.8 1.4 0.7
5.576 5.318 4.337 4.027

[1] “ann_arbor_clinical_stage”

Variable ann_arbor_clinical_stage

Nas ratio = 99.64 %

Nas ratio_2 = 0 %

Nas dif_ratio = -99.64 %

Main value % = 40 %

[min,max]=[ Stage I , Stage IV ]

Values: Stage IV Stage III Stage II Stage I

Nº Categories = 4

Stage IV Stage I Stage II Stage III
40 20 20 20

[1] “ann_arbor_extranodal_involvement”

Variable ann_arbor_extranodal_involvement

Nas ratio = 99.6 %

Nas ratio_2 = 0 %

Nas dif_ratio = -99.6 %

Main value % = 54.55 %

[min,max]=[ No , Yes ]

Values: Yes No

Nº Categories = 2

No Yes
54.55 45.45

[1] “ann_arbor_b_symptoms”

Variable ann_arbor_b_symptoms

Nas ratio = 99.6 %

Nas ratio_2 = 0 %

Nas dif_ratio = -99.6 %

Main value % = 72.73 %

[min,max]=[ No , Yes ]

Values: Yes No

Nº Categories = 2

No Yes
72.73 27.27

[1] “sample.aux”

Variable sample.aux

Nas ratio = 88.91 %

Nas ratio_2 = 0 %

Nas dif_ratio = -88.91 %

Main value % = 0.33 %

Nº Categories = 305

Table continues below
TCGA-04-1348-01 TCGA-04-1357-01 TCGA-04-1362-01 TCGA-04-1364-01
0.3279 0.3279 0.3279 0.3279
Table continues below
TCGA-04-1514-01 TCGA-09-0364-01 TCGA-09-0366-01 TCGA-09-0367-01
0.3279 0.3279 0.3279 0.3279
TCGA-09-0369-01 TCGA-09-1659-01
0.3279 0.3279

[1] “ajcc_clinical_stage”

Variable ajcc_clinical_stage

Nas ratio = 87.74 %

Nas ratio_2 = 0 %

Nas dif_ratio = -87.74 %

Main value % = 40.65 %

[min,max]=[ Stage I , Stage IVC ]

Values: Stage IVC Stage IVB Stage IVA Stage IV Stage IIIB Stage IIIA Stage III Stage IIB Stage IIA Stage II Stage IA Stage I

Nº Categories = 12

Table continues below
Stage IVA Stage III Stage II Stage I Stage IIIA Stage IV
40.65 20.77 17.21 9.199 2.374 2.374
Stage IVB Stage IIA Stage IIB Stage IVC
2.374 1.484 1.484 1.484

[1] “ajcc_clinical_n”

Variable ajcc_clinical_n

Nas ratio = 87.6 %

Nas ratio_2 = 0 %

Nas dif_ratio = -87.6 %

Main value % = 47.51 %

[min,max]=[ N0 , NX ]

Values: NX N3 N2c N2b N2a N2 N1 N0

Nº Categories = 8

Table continues below
N0 N1 N2b N2c NX N2
47.51 19.06 12.32 7.331 5.572 4.106
N2a N3
2.053 2.053

[1] “years_smoked”

Variable years_smoked

Nas ratio = 89.63 %

Nas ratio_2 = 0 %

Nas dif_ratio = -89.63 %

Main value % = 11.58 %

[min,max]=[ 2 , 64 ]

Values: 64 63 61 60 59 57 56 55 54 53 52 51 50 49 48 47 46 45 44 43 42 41 40 39 38 37 36 35 34 33

Nº Categories = 57

Table continues below
40 20 50 30 45 35
11.58 9.474 7.719 6.667 4.211 3.86
25 41 37 15
3.158 3.158 2.807 2.456

[1] “secondary_gleason_grade”

Variable secondary_gleason_grade

Nas ratio = 95.96 %

Nas ratio_2 = 0 %

Nas dif_ratio = -95.96 %

Main value % = 48.65 %

[min,max]=[ Pattern 3 , Pattern 5 ]

Values: Pattern 5 Pattern 4 Pattern 3

Nº Categories = 3

Pattern 4 Pattern 3 Pattern 5
48.65 35.14 16.22

[1] “primary_gleason_grade”

Variable primary_gleason_grade

Nas ratio = 95.96 %

Nas ratio_2 = 0 %

Nas dif_ratio = -95.96 %

Main value % = 47.75 %

[min,max]=[ Pattern 3 , Pattern 5 ]

Values: Pattern 5 Pattern 4 Pattern 3

Nº Categories = 3

Pattern 3 Pattern 4 Pattern 5
47.75 45.95 6.306

[1] “igcccg_stage”

Variable igcccg_stage

Nas ratio = 99.96 %

Nas ratio_2 = 0 %

Nas dif_ratio = -99.96 %

Main value % = 100 %

[min,max]=[ Good Prognosis , Good Prognosis ]

Values: Good Prognosis

Nº Categories = 1

Good Prognosis
100

[1] “masaoka_stage”

Variable masaoka_stage

Nas ratio = 99.85 %

Nas ratio_2 = 0 %

Nas dif_ratio = -99.85 %

Main value % = 50 %

[min,max]=[ Stage I , Stage III ]

Values: Stage III Stage IIb Stage I

Nº Categories = 3

Stage IIb Stage I Stage III
50 25 25

[1] “dead_in_year”

Variable dead_in_year

Nas ratio = 50.56 %

Nas ratio_2 = 0 %

Nas dif_ratio = -50.56 %

Main value % = 99.93 %

[min,max]=[ 0 , 1 ]

Values: 1 0

Nº Categories = 2

0 1
99.93 0.07358

[1] “index”

Variable index

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 0.04 %

[min,max]=[ 7 , 9837 ]

Min. 1st Qu. Median Mean 3rd Qu. Max.
7 3061 4481 4806.553 6604 9837

[1] “target”

Variable target

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 51.69 %

[min,max]=[ 0 , 1 ]

Values: 1 0

Nº Categories = 2

0 1
51.69 48.31

[1] “dataset”

Variable dataset

Nas ratio = 0 %

Nas ratio_2 = 0 %

Nas dif_ratio = 0 %

Main value % = 69.08 %

[min,max]=[ test , val ]

Values: val train test

Nº Categories = 3

train test val
69.08 16.81 14.11